Packages

Case studies

Load data

per lemma

Comparative analyses

Filtering

specific lemmas

# cowork # snowflake # data after 2018-12-31 # frequency threshold # edges threshold

Check tweets

# Show the text and date of every tweet for the current lemma in random
# order, for manual spot checks. The order differs between runs unless a
# seed has been set beforehand.
tweets %>%
  select(tweet, date) %>%
  # seq_len() stays empty for a zero-row table, whereas 1:n() would
  # evaluate to c(1, 0)
  slice(sample(seq_len(n())))

Usage intensity

# Derive the usage statistics of the current lemma from its tweets and show
# an interactive usage plot. All get_*/conv_*/plt_* helpers are defined
# outside this chunk (presumably in the sourced src/ scripts -- verify).
uses <- get_uses(tweets)
uses_tot <- get_uses_tot(uses)
age <- get_age(uses)
coef_var <- get_coef_var(uses)
mean_date <- get_mean_date(uses)
max_date <- get_max_date(uses)

# The plot is built from the converted table returned by conv_uses_month();
# the lemma, mean date and max date are handed to the plotting helper.
uses_month <- conv_uses_month(uses)
uses_plt <- plt_uses(uses_month, lemma, mean_date, max_date)
ggplotly(uses_plt)
`geom_smooth()` using method = 'loess' and formula 'y ~ x'

Degree centralization

Diachronic

# CENT_DEGREE of the current lemma for each subset, drawn as a connected
# line in the fixed subset order first, mean, max, last, full.
df_comp %>%
  filter(LEMMA == lemma) %>%
  mutate(
    SUBSET = factor(
      SUBSET,
      levels = c('first', 'mean', 'max', 'last', 'full')
    )
  ) %>%
  select(SUBSET, CENT_DEGREE) %>%
  # group = 1 joins all subsets into a single line on the discrete x axis
  ggplot(mapping = aes(x = SUBSET, y = CENT_DEGREE, group = 1)) +
  geom_point() +
  geom_line()

Comparative analyses

Degree centralization

Overall

List

# Lemmas ranked by the CENT_DEGREE of their 'full' subset, lowest first.
# An additional frequency cut-off (USES >= 10000) is currently disabled.
df_comp %>%
  filter(SUBSET == 'full') %>%
  select(LEMMA, SUBSET, USES, CENT_DEGREE) %>%
  arrange(CENT_DEGREE)

Plot

# Dot plot of CENT_DEGREE per lemma ('full' subset only). Lemmas are ordered
# along the y axis by their CENT_DEGREE; the x axis is log-transformed.
plt <- df_comp %>%
  filter(SUBSET == 'full') %>%
  select(LEMMA, SUBSET, USES, CENT_DEGREE) %>%
  arrange(CENT_DEGREE) %>%
  ggplot(mapping = aes(x = CENT_DEGREE, y = reorder(LEMMA, CENT_DEGREE))) +
  geom_point() +
  scale_x_continuous(trans = 'log')

# Render the static plot as an interactive plotly widget
ggplotly(plt)

Over time

Across all lemmas

# Mean CENT_DEGREE across all lemmas for each windowed subset (everything
# except 'full'), restricted to networks with at least 100 edges, plotted
# in the subset order first, mean, max, last.
df_comp %>%
  filter(
    SUBSET != 'full',
    EDGES >= 100
  ) %>%
  # Qualified with dplyr:: because Hmisc, which this notebook attaches in a
  # later chunk, also exports summarize() and masks the dplyr verb when the
  # chunk is re-run in the same session.
  dplyr::group_by(SUBSET) %>%
  dplyr::summarise(CENT_AVG = mean(CENT_DEGREE)) %>%
  mutate(
    SUBSET = factor(SUBSET, levels = c('first', 'mean', 'max', 'last'))
  ) %>%
  # group = 1 joins the subset means into a single line
  ggplot(aes(x = SUBSET, y = CENT_AVG, group = 1)) +
  geom_point() +
  geom_line()

Biggest changes

# Change in CENT_DEGREE between the 'first' and the 'last' subset of each
# lemma, using only networks with at least 100 edges.
# CENT_DIFF = CENT_DEGREE('first') - CENT_DEGREE('last'), so positive values
# mean the value dropped over time. Lemmas for which only one of the two
# subsets passes the edge filter get an NA difference and are dropped.
df_comp %>%
  select(LEMMA, SUBSET, CENT_DEGREE, EDGES) %>%
  filter(
    SUBSET %in% c('first', 'last'),
    EDGES >= 100
  ) %>%
  # Guarantee that 'first' precedes 'last' within each lemma instead of
  # relying on the row order of df_comp; lag() below depends on it.
  dplyr::arrange(LEMMA, factor(SUBSET, levels = c('first', 'last'))) %>%
  dplyr::group_by(LEMMA) %>%
  # dplyr::lag is spelled out: stats::lag() would not shift the values
  dplyr::mutate(CENT_DIFF = dplyr::lag(CENT_DEGREE) - CENT_DEGREE) %>%
  dplyr::ungroup() %>%
  # Only the 'last' row of a complete first/last pair has a non-NA CENT_DIFF
  drop_na() %>%
  select(-SUBSET) %>%
  rename(
    CENT_LAST = CENT_DEGREE,
    EDGES_LAST = EDGES
  ) %>%
  arrange(desc(CENT_DIFF))

Usage intensity

Usage intensity vs. network characteristics

Uses vs. degree centralization

Plot

# Scatter plot of USES against CENT_DEGREE for the 'full' subset, with each
# lemma drawn as a text label, both axes log-transformed and a linear fit
# overlaid. A frequency cut-off (USES >= 1000) is currently disabled.
plt <- df_comp %>%
  filter(SUBSET == 'full') %>%
  select(LEMMA, CENT_DEGREE, USES, EDGES) %>%
  ggplot(mapping = aes(x = CENT_DEGREE, y = USES)) +
  geom_text(mapping = aes(label = LEMMA)) +
  scale_y_continuous(trans = 'log') +
  scale_x_continuous(trans = 'log') +
  geom_smooth(method = lm)

# Render the static plot as an interactive plotly widget
ggplotly(plt)

Correlation

# Correlation test between USES and CENT_DEGREE over all windowed subsets
# with at least 100 edges.
# NOTE(review): despite its name, df_corr_full excludes the 'full' subset --
# confirm that this is intended.
df_corr_full <- df_comp %>%
  filter(SUBSET != 'full' & EDGES >= 100) %>%
  # Drop the identifier and bookkeeping columns
  select(-LEMMA, -SUBSET, -NET_WINDOW_DATES, -SKIP, -STAMP, -NROWS)

cor.test(df_corr_full$USES, df_corr_full$CENT_DEGREE)

Degree centralization vs. communities

Correlation

# Correlation between CENT_DEGREE and the number of communities in the
# 'last' subset. COMMUNITIES is converted with as.numeric() first.
df_comp %>%
  filter(SUBSET == 'last') %>%
  mutate(COMMUNITIES = as.numeric(COMMUNITIES)) %>%
  select(CENT_DEGREE, COMMUNITIES) %>%
  correlate()

Plot

# Lemma labels positioned by CENT_DEGREE (log-transformed x axis) and the
# numeric COMMUNITIES value, for the 'last' subset.
df_comp %>%
  filter(SUBSET == 'last') %>%
  select(LEMMA, CENT_DEGREE, COMMUNITIES) %>%
  ggplot(mapping = aes(x = CENT_DEGREE, y = as.numeric(COMMUNITIES))) +
  geom_text(mapping = aes(label = LEMMA)) +
  scale_x_continuous(trans = 'log')

Uses vs. users

Plot

# Scatter plot of USES against USERS for the 'full' subset: lemma text
# labels, log-transformed axes and a linear fit.
plt <- df_comp %>%
  filter(SUBSET == 'full') %>%
  select(LEMMA, USES, USERS) %>%
  ggplot(mapping = aes(x = USERS, y = USES)) +
  geom_text(mapping = aes(label = LEMMA)) +
  scale_x_continuous(trans = 'log') +
  scale_y_continuous(trans = 'log') +
  geom_smooth(method = lm)

# Render the static plot as an interactive plotly widget
ggplotly(plt)

Correlation

# Correlation between USES and USERS, 'full' subset only.
df_comp %>%
  filter(SUBSET == 'full') %>%
  select(c(USES, USERS)) %>%
  correlate()

Coefficient of variation

# Lemmas with at least 1000 uses in the 'full' subset, ranked by COEF_VAR
# from highest to lowest.
df_comp %>%
  filter(SUBSET == 'full' & USES >= 1000) %>%
  select(LEMMA, USES, COEF_VAR) %>%
  arrange(desc(COEF_VAR))

Processing status

Lemma list

# One row per lemma ('full' subset), with STAMP converted by as_datetime()
# and the most recent STAMP listed first.
df_comp %>%
  filter(SUBSET == 'full') %>%
  select(LEMMA, SUBSET, STAMP) %>%
  mutate(STAMP = as_datetime(STAMP)) %>%
  arrange(desc(STAMP))

Dataset statistics

# Dataset totals: USES and USERS summed over the 'full' subset rows.
# NOTE(review): USERS_TOT adds up per-lemma user counts, so a user who
# appears under several lemmas is presumably counted more than once -- verify.
df_comp %>%
  filter(SUBSET == 'full') %>%
  dplyr::summarise(USES_TOT = sum(USES), USERS_TOT = sum(USERS))

COEF_VAR vs. CENT

# Lemma labels positioned by CENT_DEGREE (x) and COEF_VAR (log-transformed
# y axis), 'full' subset only.
df_comp %>%
  filter(SUBSET == 'full') %>%
  select(LEMMA, COEF_VAR, CENT_DEGREE) %>%
  ggplot(mapping = aes(x = CENT_DEGREE, y = COEF_VAR)) +
  geom_text(mapping = aes(label = LEMMA)) +
  scale_y_continuous(trans = 'log')

Correlations: EDA

# Exploratory correlation input: df_comp without its identifier and
# bookkeeping columns, across all subsets.
# NOTE(review): attaching Hmisc here masks dplyr::summarize() for anything
# run afterwards in the same session.
library(Hmisc)

df_corr <- df_comp %>%
  # Optional restriction to a single subset (disabled):
  # filter(SUBSET == 'last') %>%
  select(-LEMMA, -SUBSET, -NET_WINDOW_DATES, -SKIP, -STAMP, -NROWS)
  # Disabled exploratory steps, kept for reference:
  # select(-c(USERS, AGE)) %>%
  # mutate(FOCUS = USES) %>%
  # focus(FOCUS) %>%
  # ggplot(., aes(reorder(rowname, FOCUS), FOCUS)) +
    # geom_col() +
    # coord_flip()
  # rearrange() %>%
  # shave() %>%
  # rplot()
  # network_plot(min_cor=.5) %>%

  
LS0tCmF1dGhvcjogJ1F1aXJpbiBXw7xyc2NoaW5nZXInCnRpdGxlOiAiU29jaWFsIG5ldHdvcmtzIG9mIGxleGljYWwgaW5ub3ZhdGlvbiIKb3V0cHV0OiAKICBodG1sX25vdGVib29rOiAKICAgIHRvYzogeWVzCi0tLQoKIyBQYWNrYWdlcwoKYGBge3IgaW5jbHVkZT1GQUxTRX0Kc291cmNlKCdzcmMvbG9hZC1kYXRhLlInKQpzb3VyY2UoJ3NyYy9wb3N0cHJvYy5SJykKc291cmNlKCdzcmMvdXNlcy5SJykKc291cmNlKCdzcmMvdXNlcnMuUicpCnNvdXJjZSgnc3JjL3NuYS5SJykKCmxpYnJhcnkoY29ycnIpCmxpYnJhcnkodGlkeXIpCmBgYAoKIyBDYXNlIHN0dWRpZXMKCiMjIExvYWQgZGF0YQoKIyMjIHBlciBsZW1tYQoKYGBge3IgaW5jbHVkZT1GQUxTRX0KY29ycHVzIDwtICcvVm9sdW1lcy9xamQvdHdpbnQvJwpsZW1tYSA8LSAnYmlnIGRpY2sgZW5lcmd5JwoKdHdlZXRzIDwtIGxvYWRfZGF0YShjb3JwdXMsIGxlbW1hKQp0d2VldHMgPC0gcG9zdHByb2ModHdlZXRzKQpgYGAKCiMjIyBDb21wYXJhdGl2ZSBhbmFseXNlcwoKYGBge3IgaW5jbHVkZT1GQUxTRX0KaWYgKGV4aXN0cygnZGZfY29tcCcpID09IEZBTFNFKSB7CiAgZGZfY29tcCA8LSByZWFkX2Nzdignb3V0L2RmX2NvbXAuY3N2JykKfQpgYGAKCgojIyMjIEZpbHRlcmluZwoKIyBzcGVjaWZpYyBsZW1tYXMKICAjIGNvd29yawogICMgc25vd2ZsYWtlCiMgZGF0YSBhZnRlciAyMDE4LTEyLTMxCiMgZnJlcXVlbmN5IHRocmVzaGhvbGQKIyBlZGdlcyB0aHJlc2hob2xkCgoKIyMgQ2hlY2sgdHdlZXRzCgpgYGB7cn0KdHdlZXRzICU+JQogIHNlbGVjdCh0d2VldCwgZGF0ZSkgJT4lCiAgc2xpY2UoLiwgc2FtcGxlKDE6bigpKSkKYGBgCgoKIyMgVXNhZ2UgaW50ZW5zaXR5CgpgYGB7cn0KdXNlcyA8LSBnZXRfdXNlcyh0d2VldHMpCnVzZXNfdG90IDwtIGdldF91c2VzX3RvdCh1c2VzKQphZ2UgPSBnZXRfYWdlKHVzZXMpCmNvZWZfdmFyIDwtIGdldF9jb2VmX3Zhcih1c2VzKQptZWFuX2RhdGUgPC0gZ2V0X21lYW5fZGF0ZSh1c2VzKQptYXhfZGF0ZSA8LSBnZXRfbWF4X2RhdGUodXNlcykKdXNlc19tb250aCA8LSBjb252X3VzZXNfbW9udGgodXNlcykKdXNlc19wbHQgPC0gcGx0X3VzZXModXNlc19tb250aCwgbGVtbWEsIG1lYW5fZGF0ZSwgbWF4X2RhdGUpCmdncGxvdGx5KHVzZXNfcGx0KQpgYGAKCgojIyBEZWdyZWUgY2VudHJhbGl6YXRpb24KCiMjIyBEaWFjaHJvbmljCgpgYGB7cn0KZGZfY29tcCAlPiUKICBmaWx0ZXIoTEVNTUEgPT0gbGVtbWEpICU+JQogIHNlbGVjdChTVUJTRVQsIENFTlRfREVHUkVFKSAlPiUKICBtdXRhdGUoU1VCU0VUID0gZmFjdG9yKFNVQlNFVCwgbGV2ZWxzPWMoJ2ZpcnN0JywgJ21lYW4nLCAnbWF4JywgJ2xhc3QnLCAnZnVsbCcpKSkgJT4lCiAgZ2dwbG90KC4sIGFlcyh4PVNVQlNFVCwgeT1DRU5UX0RFR1JFRSwgZ3JvdXA9MSkpICsKICAgIGdlb21fcG9pbnQoKSArCiAgICBnZW9tX2xpbmUoKQpgYGAKCgojIENvbXBhcmF0aXZlIGFuYWx5c2Vz
CgoKIyMgRGVncmVlIGNlbnRyYWxpdHkKCgojIyMgT3ZlcmFsbAoKIyMjIyBMaXN0CgpgYGB7cn0KZGZfY29tcCAlPiUKICBzZWxlY3QoTEVNTUEsIFNVQlNFVCwgVVNFUywgQ0VOVF9ERUdSRUUpICU+JQogIGZpbHRlcigKICAgIFNVQlNFVCA9PSAnZnVsbCcsCiAgICAjIFVTRVMgPj0gMTAwMDAKICAgICkgJT4lCiAgYXJyYW5nZSgoQ0VOVF9ERUdSRUUpKQpgYGAKCgojIyMjIFBsb3QKCmBgYHtyfQpwbHQgPC0gZGZfY29tcCAlPiUKICBzZWxlY3QoTEVNTUEsIFNVQlNFVCwgVVNFUywgQ0VOVF9ERUdSRUUpICU+JQogIGZpbHRlcihTVUJTRVQgPT0gJ2Z1bGwnKSAlPiUKICBhcnJhbmdlKChDRU5UX0RFR1JFRSkpICU+JQogIGdncGxvdCguLCBhZXMoeD1DRU5UX0RFR1JFRSwgeT1yZW9yZGVyKExFTU1BLCBDRU5UX0RFR1JFRSkpKSArCiAgICBnZW9tX3BvaW50KCkgKwogICAgc2NhbGVfeF9jb250aW51b3VzKHRyYW5zPSdsb2cnKQpnZ3Bsb3RseShwbHQpCmBgYAoKCiMjIyBPdmVyIHRpbWUKCiMjIyMgQWNyb3NzIGFsbCBsZW1tYXMKCmBgYHtyfQpkZl9jb21wICU+JQogIGZpbHRlcigKICAgIFNVQlNFVCAhPSAnZnVsbCcsCiAgICBFREdFUyA+PSAxMDAKICAgICkgJT4lCiAgZ3JvdXBfYnkoU1VCU0VUKSAlPiUKICBzdW1tYXJpemUoQ0VOVF9BVkcgPSBtZWFuKENFTlRfREVHUkVFKSkgJT4lCiAgbXV0YXRlKFNVQlNFVCA9IGZhY3RvcihTVUJTRVQsIGxldmVscz1jKCdmaXJzdCcsICdtZWFuJywgJ21heCcsICdsYXN0JykpKSAlPiUKICBnZ3Bsb3QoLiwgYWVzKHg9U1VCU0VULCB5PUNFTlRfQVZHLCBncm91cD0xKSkgKwogICAgZ2VvbV9wb2ludCgpICsKICAgIGdlb21fbGluZSgpCmBgYAoKCiMjIyMgQmlnZ2VzdCBjaGFuZ2VzCgpgYGB7cn0KZGZfY29tcCAlPiUKICBzZWxlY3QoTEVNTUEsIFNVQlNFVCwgQ0VOVF9ERUdSRUUsIEVER0VTKSAlPiUKICBmaWx0ZXIoCiAgICBTVUJTRVQgJWluJSBjKCdmaXJzdCcsICdsYXN0JyksCiAgICBFREdFUyA+PSAxMDAKICAgICkgJT4lCiAgZHBseXI6Omdyb3VwX2J5KExFTU1BKSAlPiUKICBkcGx5cjo6bXV0YXRlKENFTlRfRElGRiA9IGxhZyhDRU5UX0RFR1JFRSkgLSBDRU5UX0RFR1JFRSkgJT4lCiAgZHJvcF9uYSgpICU+JQogIHNlbGVjdCgtU1VCU0VUKSAlPiUKICByZW5hbWUoCiAgICBDRU5UX0xBU1QgPSBDRU5UX0RFR1JFRSwKICAgIEVER0VTX0xBU1QgPSBFREdFUwogICAgKSAlPiUKICBhcnJhbmdlKGRlc2MoQ0VOVF9ESUZGKSkKYGBgCgoKIyBVc2FnZSBpbnRlbnNpdHkKCmBgYHtyfQpkZl9jb21wICU+JQogIGZpbHRlcihTVUJTRVQgPT0gJ2Z1bGwnKSAlPiUKICBhcnJhbmdlKGRlc2MoVVNFUykpCmBgYAoKCgojIFVzYWdlIGludGVuc2l0eSB2cy4gbmV0d29yayBjaGFyYWN0ZXJpc3RpY3MKCiMjIFVzZXMgdnMuIGRlZ3JlZSBjZW50cmFsaXphdGlvbgoKIyMjIFBsb3QKCmBgYHtyfQpwbHQgPC0gZGZfY29tcCAlPiUKICBmaWx0ZXIoCiAgICBTVUJTRVQgPT0gJ2Z1bGwnLAogICAg
IyBVU0VTID49IDEwMDAKICAgICkgJT4lCiAgc2VsZWN0KExFTU1BLCBDRU5UX0RFR1JFRSwgVVNFUywgRURHRVMpICU+JQogIGdncGxvdCguLCBhZXMoeD1DRU5UX0RFR1JFRSwgeT1VU0VTKSkgKwogICAgZ2VvbV90ZXh0KGFlcyhsYWJlbD1MRU1NQSkpICsgCiAgICBzY2FsZV95X2NvbnRpbnVvdXModHJhbnM9J2xvZycpICsKICAgIHNjYWxlX3hfY29udGludW91cyh0cmFucz0nbG9nJykgKwogICAgZ2VvbV9zbW9vdGgobWV0aG9kPWxtKQpnZ3Bsb3RseShwbHQpCmBgYAoKIyMjIENvcnJlbGF0aW9uCgpgYGB7cn0KZGZfY29ycl9mdWxsIDwtIGRmX2NvbXAgJT4lCiAgZmlsdGVyKAogICAgU1VCU0VUICE9ICdmdWxsJywKICAgIEVER0VTID49IDEwMAogICAgKSAlPiUKICBzZWxlY3QoLWMoTEVNTUEsIFNVQlNFVCwgTkVUX1dJTkRPV19EQVRFUywgU0tJUCwgU1RBTVAsIE5ST1dTKSkKICAKY29yLnRlc3QoZGZfY29ycl9mdWxsJFVTRVMsIGRmX2NvcnJfZnVsbCRDRU5UX0RFR1JFRSkKYGBgCgoKIyMgRGVncmVlIGNlbnRyYWxpdHkgdnMuIGNvbW11bml0aWVzCgojIyMgQ29ycmVsYXRpb24KCmBgYHtyfQpkZl9jb21wICU+JQogIGZpbHRlcihTVUJTRVQgPT0gJ2xhc3QnKSAlPiUKICBzZWxlY3QoQ0VOVF9ERUdSRUUsIENPTU1VTklUSUVTKSAlPiUKICBtdXRhdGUoQ09NTVVOSVRJRVMgPSBhcy5udW1lcmljKENPTU1VTklUSUVTKSkgJT4lCiAgY29ycmVsYXRlKCkKYGBgCgoKIyMjIFBsb3QKCmBgYHtyfQpkZl9jb21wICU+JQogIGZpbHRlcihTVUJTRVQgPT0gJ2xhc3QnKSAlPiUKICBzZWxlY3QoTEVNTUEsIENFTlRfREVHUkVFLCBDT01NVU5JVElFUykgJT4lCiAgZ2dwbG90KC4sIGFlcyh4PUNFTlRfREVHUkVFLCB5PWFzLm51bWVyaWMoQ09NTVVOSVRJRVMpKSkgKwogICAgZ2VvbV90ZXh0KGFlcyhsYWJlbD1MRU1NQSkpICsKICAgIHNjYWxlX3hfY29udGludW91cyh0cmFucz0nbG9nJykKYGBgCgoKCiMjIFVzZXMgdnMuIHVzZXJzCgojIyMgUGxvdAoKYGBge3J9CnBsdCA8LSBkZl9jb21wICU+JQogIGZpbHRlcihTVUJTRVQgPT0gJ2Z1bGwnKSAlPiUKICBzZWxlY3QoTEVNTUEsIFVTRVMsIFVTRVJTKSAlPiUKICBnZ3Bsb3QoLiwgYWVzKHg9VVNFUlMsIHk9VVNFUykpICsKICAgIGdlb21fdGV4dChhZXMobGFiZWw9TEVNTUEpKSArCiAgICBzY2FsZV94X2NvbnRpbnVvdXModHJhbnM9J2xvZycpICsKICAgIHNjYWxlX3lfY29udGludW91cyh0cmFucz0nbG9nJykgKwogICAgZ2VvbV9zbW9vdGgobWV0aG9kPWxtKQpnZ3Bsb3RseShwbHQpCmBgYAoKIyMjIENvcnJlbGF0aW9uCgpgYGB7cn0KZGZfY29tcCAlPiUKICBmaWx0ZXIoU1VCU0VUID09ICdmdWxsJykgJT4lCiAgc2VsZWN0KFVTRVMsIFVTRVJTKSAlPiUKICBjb3JyZWxhdGUoKQpgYGAKCgojIyBDb2VmZmljaWVudCBvZiB2YXJpYXRpb24KCmBgYHtyfQpkZl9jb21wICU+JQogIGZpbHRlcigKICAgIFNVQlNFVCA9PSAnZnVsbCcsCiAgICBVU0VTID49IDEwMDAKICAgICkgJT4l
CiAgc2VsZWN0KExFTU1BLCBVU0VTLCBDT0VGX1ZBUikgJT4lCiAgYXJyYW5nZShkZXNjKENPRUZfVkFSKSkKYGBgCgoKIyMgUHJvY2Vzc2luZyBzdGF0dXMKCiMjIyBMZW1tYSBsaXN0CgpgYGB7cn0KZGZfY29tcCAlPiUKICBzZWxlY3QoTEVNTUEsIFNVQlNFVCwgU1RBTVApICU+JQogIGZpbHRlcihTVUJTRVQgPT0gJ2Z1bGwnKSAlPiUKICBtdXRhdGUoU1RBTVAgPSBhc19kYXRldGltZShTVEFNUCkpICU+JQogIGFycmFuZ2UoZGVzYyhTVEFNUCkpCmBgYAoKCiMjIyBEYXRhc2V0IHN0YXRpc3RpY3MKCmBgYHtyfQpkZl9jb21wICU+JQogIGZpbHRlcihTVUJTRVQgPT0gJ2Z1bGwnKSAlPiUKICBzZWxlY3QoTEVNTUEsIFNVQlNFVCwgVVNFUywgVVNFUlMpICU+JQogIGRwbHlyOjpzdW1tYXJpc2UoCiAgICBVU0VTX1RPVCA9IHN1bShVU0VTKSwKICAgIFVTRVJTX1RPVCA9IHN1bShVU0VSUykKICAgICkKYGBgCgoKIyBDT0VGX1ZBUiB2cy4gQ0VOVAoKYGBge3J9CmRmX2NvbXAgJT4lCiAgZmlsdGVyKFNVQlNFVCA9PSAnZnVsbCcpICU+JQogIHNlbGVjdChMRU1NQSwgQ09FRl9WQVIsIENFTlRfREVHUkVFKSAlPiUKICBnZ3Bsb3QoLiwgYWVzKHk9Q09FRl9WQVIsIHg9Q0VOVF9ERUdSRUUpKSArCiAgICBnZW9tX3RleHQoYWVzKGxhYmVsPUxFTU1BKSkgKwogICAgc2NhbGVfeV9jb250aW51b3VzKHRyYW5zPSdsb2cnKQpgYGAKCgojIENvcnJlbGF0aW9uczogRURBCgpgYGB7cn0KbGlicmFyeShIbWlzYykKCmRmX2NvcnIgPC0gZGZfY29tcCAlPiUKICAjIGZpbHRlcihTVUJTRVQgPT0gJ2xhc3QnKSAlPiUKICBzZWxlY3QoLWMoTEVNTUEsIFNVQlNFVCwgTkVUX1dJTkRPV19EQVRFUywgU0tJUCwgU1RBTVAsIE5ST1dTKSkKICAjIHNlbGVjdCgtYyhVU0VSUywgQUdFKSkgJT4lCiAgIyBtdXRhdGUoRk9DVVMgPSBVU0VTKSAlPiUKICAjIGZvY3VzKEZPQ1VTKSAlPiUKICAjIGdncGxvdCguLCBhZXMocmVvcmRlcihyb3duYW1lLCBGT0NVUyksIEZPQ1VTKSkgKwogICAgIyBnZW9tX2NvbCgpICsKICAgICMgY29vcmRfZmxpcCgpCiAgIyByZWFycmFuZ2UoKSAlPiUKICAjIHNoYXZlKCkgJT4lCiAgIyBycGxvdCgpCiAgIyBuZXR3b3JrX3Bsb3QobWluX2Nvcj0uNSkgJT4lCgogIApgYGAKCgogIA==